- Notifications
You must be signed in to change notification settings - Fork 251
/
Copy pathBoston_Spyder.py
46 lines (36 loc) · 1.15 KB
/
Boston_Spyder.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
#-*- coding:utf-8 -*-
# &Author AnFany
import urllib
import urllib.request
from collections import OrderedDict

import pandas as pd
from bs4 import BeautifulSoup as bs
# Page that serves the Boston housing data as plain text.
BOSTON_URL = "http://lib.stat.cmu.edu/datasets/boston"

# Destination of the generated CSV (same location the script has always used).
OUTPUT_CSV = r'C:\Users\GWT9\Desktop\Boston.csv'

# Layout of the page text, as zero-based indexes after splitting on '\n':
# lines 7..20 each begin with a field name and the numeric data starts at
# line 22.
_FIRST_NAME_LINE = 7
_NAME_LINES_END = 21  # exclusive
_FIRST_DATA_LINE = 22


def parse_boston_text(text):
    """Turn the text of the Boston data page into per-field columns.

    Args:
        text: Full page text; lines are separated by '\\n'.

    Returns:
        An OrderedDict mapping each field name (in the order the names are
        listed in the page) to the list of its values. Values are kept as
        the strings found in the page, so the CSV written from them
        reproduces the source formatting exactly.

    Raises:
        ValueError: If no field names are found, or if the number of data
            values is not a whole multiple of the number of fields.
    """
    lines = text.split('\n')

    # Field names: the first whitespace-delimited token of each name line.
    # Taking the whole token (rather than a fixed-width slice) keeps a name
    # intact regardless of how much leading whitespace the line carries.
    names = [
        line.split()[0]
        for line in lines[_FIRST_NAME_LINE:_NAME_LINES_END]
        if line.strip()
    ]
    if not names:
        raise ValueError("no field names found in the page text")

    # A record may be wrapped over several physical lines, so read the data
    # section as one flat stream of values; every len(names) consecutive
    # values form one record. Blank lines contribute nothing to the stream.
    values = []
    for line in lines[_FIRST_DATA_LINE:]:
        values.extend(line.split())

    width = len(names)
    if len(values) % width:
        raise ValueError(
            "found %d data values, which is not a multiple of the %d fields"
            % (len(values), width)
        )

    # Ordered mapping so the columns come out in the order the fields were
    # listed. Column i is every width-th value starting at offset i.
    return OrderedDict(
        (field, values[offset::width]) for offset, field in enumerate(names)
    )


def fetch_page_text(url=BOSTON_URL):
    """Download *url* and return the text content of its HTML body."""
    # The context manager closes the HTTP response once it has been read.
    with urllib.request.urlopen(url) as response:
        markup = response.read()
    return str(bs(markup, "html5lib").body.get_text())


def main():
    """Download the Boston data, parse it and write it to OUTPUT_CSV."""
    columns = parse_boston_text(fetch_page_text())
    # Write to file.
    pd.DataFrame(columns).to_csv(OUTPUT_CSV, index=False)
    print('完毕')


# Run the download only when executed as a script, so the parsing helpers
# can be imported without touching the network or the file system.
if __name__ == "__main__":
    main()